# configuration\_files/BOOMV3\_PIM/processor\_PIM.cfg //========RVV BIGGER LOADS======== // 0 -> Disabled // N -> Number of bytes loaded by the first of a vector load SIMULATED\_VECTOR\_LOAD\_SIZE = x; //========RVV BIGGER LOADS=========

Alteração/Solução: Ao invés de enviar um prefetch avulso, a primeira instrução que dá MISS vira um prefetch.

## processor\_t

// Minimum number of bytes loaded by each first vector load;
// Default is 0
uint32\_t SIMULATED\_VECTOR\_LOAD\_SIZE;

INSTANTIATE\_GET\_SET\_ADD (uint32\_t, SIMULATED\_VECTOR\_LOAD\_SIZE)

bool is\_vector\_insn(opcode\_package\_t \*);

#### processor\_t::allocate()

// libconfig::Setting &cfg\_root = orcs\_engine.configuration->getConfig();
// libconfig::Setting &cfg\_processor = cfg\_root["PROCESSOR"][0];
if (cfg\_processor.exists("SIMULATED\_VECTOR\_LOAD\_SIZE"))
 set\_SIMULATED\_VECTOR\_LOAD\_SIZE(cfg\_processor["SIMULATED\_VECTOR\_LOAD\_SIZE"]);
else
 set\_SIMULATED\_VECTOR\_LOAD\_SIZE(0);

## processor\_t::rename()

// Adicionar
for (uint32\_t r = 0; r < rob\_line->uop.num\_mem\_operations; ++r)

uint32\_t pos = (pos\_mob + r) % MOB\_LIMIT; rob\_line->mob\_base[pos].is\_first\_of\_vector\_load = ((r == 0) && rob\_line->uop.is\_vector\_insn);

## cache\_manager\_t::process()

// Em:
} else if (!request->sent\_to\_ram) {
 <AQUI>

Adicionar:

// Check if its the first load request from RVV

if (((memory\_order\_buffer\_line\_t \*)request->clients[0])->is\_first\_of\_vector\_load) {

// Change the request memory\_size

request->memory\_size = (request->memory\_size < SIMULATED\_VECTOR\_LOAD\_SIZE) ?

SIMULATED\_VECTOR\_LOAD\_SIZE : request->memory\_size;

memory\_order\_buffer\_line\_t

memory\_order\_buffer\_line\_t::package\_clean()

bool is\_first\_of\_vector\_load;

this->is\_first\_of\_vector\_load = false;

# processor\_t::is\_vector\_insn(opcode\_package\_t \*insn)

// Deve verificar se o opcode\_assembly começa com v
if (insn->opcode\_assembly[0] == 'v') return true;
return false;

Alerta: Isso foi planejado para um processador in-order.

Problema: Se mais requisições forem feitas em paralelo, elas podem não aproveitar a expandida (já que a verificação do MSHR já passou quando ela é gerada).

uop\_package\_t

bool is\_vector\_insn;

opcode\_package\_t
...
bool is\_vector\_insn;

uop\_package\_t::opcode\_to\_uop(...)
...
this->is\_vector\_insn = opcode.is\_vector\_insn;

processor\_t::fetch(...)